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<210> 1 

<211> 4307 

<212> DNA 

<213> Human immunodeficiency virus type 1 



<400> 1 

atgggtgcga 

ttaaggccag 

ctagaacgat 

ctgggacagc 

acagtagcaa 

ttagacaaga 

gacacaggac 

caaatggtac 

gagaaggctt 

ccacaagatt 

ttaaaagaga 

gggcctattg 

agtacccttc 

atttataaaa 

agcattctgg 

tataaaactc 

ttgttggtcc 

gctacactag 

agagttttgg 

ggcaatttta 

acagccagaa 

caccaaatga 

tacaagggaa 

gagagcttca 

aaggaactgt 

taaagatagg 

tagaagaaat 

ttatcaaagt 

gtacagtatt 

ttggttgcac 



gagcgtcagt 
ggggaaagaa 
tcgcagttaa 
tacaaccatc 
ccctctattg 
tagaggaaga 
acagcaatca 
atcaggccat 
tcagcccaga 
taaacaccat 
ccatcaatga 
caccaggcca 
aggaacaaat 
gatggataat 
acataagaca 
taagagccga 
aaaatgcgaa 
aagaaatgat 
ctgaagcaat 
ggaaccaaag 
attgcagggc 
aagattgtac 
ggccagggaa 
ggtctggggt 
atcctttaac 
ggggcaacta 
gagtttgcca 
aagacagtat 
agtaggacct 
tttaaatttt 



attaagcggg 
aaaatataaa 
tcctggcctg 
ccttcagaca 
tgtgcatcaa 
gcaaaacaaa 
ggtcagccaa 
atcacctaga 
agtgataccc 
gctaaacaca 
ggaagctgca 
gatgagagaa 
aggatggatg 
cctgggatta 
aggaccaaag 
gcaagcttca 
cccagattgt 
gacagcatgt 
gagccaagta 
aaagattgtt 
ccctaggaaa 
tgagagacag 
ttttcttcag 
agagacaaca 
ttccctcagg 
aaggaagctc 
ggaagatgga 
gatcagatac 
acacctgtca 
cccattagcc 



ggagaattag 
ttaaaacata 
ttagaaacat 
ggatcagaag 
aggatagaga 
agtaagaaaa 
aattacccta 
actttaaatg 
atgttttcag 
gtggggggac 
gaatgggata 
ccaaggggaa 
acaaataatc 
aataaaatag 
gaacccttta 
caggaggtaa 
aagactattt 
cagggagtag 
acaaattcag 
aagtgtttca 
aagggctgtt 
gctaattttt 
agcagaccag 
actccccctc 
tcactctttg 
tattagatac 
aaccaaaaat 
tcatagaaat 
acataattgg 
ctattgagac 



atcgatggga 
tagtatgggc 
cagaaggctg 
aacttagatc 
taaaagacac 
aagcacagca 
tagtgcagaa 
catgggtaaa 
cattatcaga 
atcaagcagc 
gagtgcatcc 
gtgacatagc 
cacctatccc 
taagaatgta 
gagactatgt 
aaaattggat 
taaaagcatt 
gaggacccgg 
ctaccataat 
attgtggcaa 
ggaaatgtgg 
tagggaagat 
agccaacagc 
agaagcagga 
gcaacgaccc 
aggagcagat 
gataggggga 
ctgtggacat 
aagaaatctg 
tgtaccagta 



aaaaattcgg 
aagcagggag 
tagacaaata 
attatataat 
caaggaagct 
agcagcagct 
catccagggg 
agtagtagaa 
aggagccacc 
catgcaaatg 
agtgcatgca 
aggaactact 
agtaggagaa 
tagccctacc 
agaccggttc 
gacagaaacc 
gggaccagcg 
ccataaggca 
gatgcagaga 
agaagggcac 
aaaggaagga 
ctggccttcc 
cccaccagaa 
gccgatagac 
ctcgtcacaa 
gatacagtat 
attggaggtt 
aaagctatag 
ttgactcaga 
aaattaaagc 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 



caggaatgga 
tagtagaaat 
atccatacaa 
tagtagattt 
taccacatcc 
catatttttc 
gtataaacaa 
aaggatcacc 
aaaatccaga 
aaatagggca 
ttaccacacc 
tccatcctga 
tcaatgacat 
ttaaagtaag 
cactaacaga 
tacatggagt 
aaggccaatg 
atgcaagaat 
aaataaccac 
aaaaggaaac 
gggagtttgt 
tagtaggagc 
aagcaggata 
atcagaagac 
acatagtaac 
aatcagagtt 
catgggtacc 
ctggaatcag 
aatatcacag 
aagaaatagt 
tagactgtag 
tggtagcagt 
ggcaggaaac 
atactgacaa 
gaatcaagca 
tgaataaaga 
cagcagtaca 
acagtgcagg 
aaaaacaaat 
tttggaaagg 
atagtgacat 
agatggcagg 



tggcccaaaa 
ttgtacagag 
tactccagta 
cagagaactt 
cgcagggtta 
agttccctta 
tgagacacca 
agcaatattc 
catagttatc 
gcatagaaca 
agacaaaaaa 
taaatggaca 
acagaagtta 
gcaattatgt 
agaagcagag 
gtattatgac 
gacatatcaa 
gaggggtgcc 
agaaagcata 
atgggaaaca 
taatacccct 
agaaaccttc 
tgttactaat 
tgagttacaa 
agactcacaa 
agtcaatcaa 
agcacacaaa 
gaaagtacta 
taattggaga 
agccagctgt 
tccaggaata 
tcatgtagcc 
agcatatttt 
tggcagcaat 
ggaatttgga 
attaaagaaa 
aatggcagta 
ggaaagaata 
tacaaaaatt 
accagcaaag 
aaaagtagtg 
tgatgattgt 



gttaaacaat 
atggaaaagg 
tttgccataa 
aataagagaa 
aaaaagaaaa 
gatgaagact 
gggattagat 
caaagtagca 
tatcaataca 
aaaatagagg 
catcagaaag 
gtacagccta 
gtggggaaat 
aaactcctta 
ctagaactgg 
ccatcaaaag 
atttatcaag 
cacactaatg 
gtaatatggg 
tggtggacag 
cccttagtga 
tatgtagatg 
agaggaagac 
gcaatttatc 
tatgcattag 
ataatagagc 
ggaattggag 
tttttagatg 
gcaatggcta 
gataaatgtc 
tggcaactag 
agtggatata 
cttttaaaat 
ttcaccggtg 
attccctaca 
attataggac 
ttcatccaca 
gtagacataa 
caaaattttc 
ctcctctgga 
ccaagaagaa 
gtggcaagta 



ggccattgac 
aagggaaaat 
agaaaaaaga 
ctcaagactt 
aatcagtaac 
tcaggaagta 
atcagtacaa 
tgacaaaaat 
tggatgattt 
agctgagaca 
aacctccatt 
tagtgctgcc 
tgaattgggc 
gaggaaccaa 
cagaaaacag 
acttaatagc 
agccatttaa 
atgtaaaaca 
gaaagactcc 
agtattggca 
aattatggta 
gggcagctaa 
aaaaagttgt 
tagctttgca 
gaatcattca 
agttaataaa 
gaaatgaaca 
gaatagataa 
gtgattttaa 
agctaaaagg 
attgtacaca 
tagaagcaga 
tagcaggaag 
ctacggttag 
atccccaaag 
aggtaagaga 
attttaaaag 
tagcaacaga 
gggtttatta 
aaggtgaagg 
aagcaaagat 
gacaggatga 



agaagaaaaa 
ttcaaaaatt 
cagtactaaa 
ctgggaagtt 
agtactggat 
tactgcattt 
tgtgcttcca 
cttagagcct 
gtatgtagga 
acatctgttg 
cctttggatg 
agaaaaagac 
aagtcagatt 
agcactaaca 
agagattcta 
agaaatacag 
aaatctgaaa 
attaacagag 
taaatttaaa 
agccacctgg 
ccagttagag 
cagggagact 
caccctaact 
ggattcggga 
agcacaacca 
aaaggaaaag 
agtagataaa 
ggcccaagat 
cctgccacct 
agaagccatg 
tttagaagga 
agttattcca 
atggccagta 
ggccgcctgt 
tcaaggagta 
tcaggctgaa 
aaaagggggg 
catacaaact 
cagggacagc 
ggcagtagta 
cattagggat 
ggattag 



ataaaagcat 
gggcctgaaa 
tggagaaaat 
caattaggaa 
gtgggtgatg 
accataccta 
cagggatgga 
tttagaaaac 
tctgacttag 
aggtggggac 
ggttatgaac 
agctggactg 
tacccaggga 
gaagtaatac 
aaagaaccag 
aagcaggggc 
acaggaaaat 
gcagtgcaaa 
ctgcccatac 
attcctgagt 
aaagaaccca 
aaattaggaa 
gacacaacaa 
ttagaagtaa 
gatcaaagtg 
gtctatctgg 
ttagtcagtg 
gaacatgaga 
gtagtagcaa 
catggacaag 
aaagttatcc 
gcagaaacag 
aaaacaatac 
tggtgggcgg 
gtagaatcta 
catcttaaga 
attggggggt 
aaagaattac 
agaaattcac 
atacaagata 
tatggaaaac 



1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4307 



<210> 2 
<211> 4307 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: 

gagpol-SYNgp-codon optimised gagpol sequence 

<400> 2 

atgggcgccc gcgccagcgt gctgtcgggc ggcgagctgg accgctggga gaagatccgc 60 
ctgcgccccg gcggcaaaaa gaagtacaag ctgaagcaca tcgtgtgggc cagccgcgaa 120
ctggagcgct tcgccgtgaa ccccgggctc ctggagacca gcgaggggtg ccgccagatc 180 
ctcggccaac tgcagcccag cctgcaaacc ggcagcgagg agctgcgcag cctgtacaac 240



accgtggcca 
ctggataaaa 
gacaccggac 
cagatggtgc 
gagaaggctt 
ccccaagatc 
ctgaaggaga 
gggcccatcg 
agtacccttc 
atctacaaac 
agcatcctgg 
tacaaaacgc 
ctgctggtcc 
gctaccctag 
cgcgtcctgg 
ggcaactttc 
acagcccgca 
caccagatga 
tacaagggaa 
gagagcttca 
aaggaactgt 
taaagatagg 
tggaggagat 
tcatcaaggt 
gtaccgtgct 
tcggttgcac 
ccgggatgga 
tggtggagat 
acccgtacaa 

tggtggactt 

tcccgcaccc 
cctacttctc 
cgatcaacaa 
aaggctctcc 
agaaccccga 
agatagggca 
tgaccacacc 
tgcaccctga 
tcaacgacat 
ttaaggtgag 
ccctaaccga 
tgcacggcgt 
aaggccagtg 
acgcccggat 
agatcaccac 
agaaggaaac 
gggagttcgt 
tagtgggcgc 
aagccggata 
accagaagac 
acatcgtgac 
agtccgagct 
cctgggtacc 
ctggcatcag 
aataccacag 
aagagatcgt 
tggactgtag 
tggtagccgt 



cgctgtactg 
tcgaagagga 
acagcaacca 
accaggccat 
ttagcccgga 
tgaacaccat 
ccatcaatga 
caccgggcca 
aggaacagat 
gctggatcat 
acatccgcca 
tccgcgccga 
agaacgcgaa 
aggaaatgat 
ctgaggccat 
ggaaccaacg 
actgcagggc 
aagactgtac 
ggccagggaa 
ggtctggggt 
atcctttaac 
ggggcagctc 
gtcgttgcca 
gcgccagtat 
ggtgggcccc 
gctgaacttc 
cggcccgaag 
ttgcacagag 
cacgccggtg 
ccgcgagctg 
cgcagggctg 
cgttcccctg 
cgagacaccg 
cgcaatcttc 
catcgtcatc 
gcaccgcacc 
cgacaagaag 
caaatggacc 
acagaagctg 
gcagctgtgc 
ggaggccgag 
gtactatgac 
gacctatcag 
gaggggtgcc 
cgaaagcatc 
ctgggaaacc 
caacacccct 
cgaaaccttc 
cgtcactaac 
tgagctgcag 
agactctcag 
ggtcaatcag 
cgcccacaaa 
gaaggtgcta 
caactggcgg 
ggccagctgt 
ccccggcatc 
ccatgtggcc 



cgtccaccag 
acagaataag 
ggtcagccag 
ctccccccgc 
ggtgataccc 
gctcaacaca 
ggaggctgcc 
gatgcgtgag 
cggctggatg 
cctgggcctg 
aggcccgaag 
gcaggctagc 
cccggactgc 
gaccgcctgt 
gagccaggtg 
caagatcgtc 
ccctaggaaa 
tgagagacag 
ttttcttcag 
agagacaaca 
ttccctcaga 
aaggaggctc 
ggccgctgga 
gaccagatcc 
acacccgtca 
cccattagcc 
gtcaagcaat 
atggaaaagg 
ttcgcaatca 
aacaagcgca 
aagaagaaga 
gacgaagact 
gggattcgat 
cagagtagca 
tatcagtaca 
aagatcgagg 
caccagaagg 
gtgcagccta 
gtggggaagt 
aaactcctcc 
ctcgaactgg 
ccctccaagg 
atttaccagg 
cacactaacg 
gtgatctggg 
tggtggacag 
cccctggtga 
tacgtggatg 
cggggcagac 
gccatttacc 
tatgccctgg 
atcatcgagc 
ggcattggcg 
ttcctggatg 
gccatggcta 
gacaagtgtc 
tggcaactcg 
agtggctaca 



cgcatcgaaa 
agcaaaaaga 
aactacccca 
acgctgaacg 
atgttctcag 
gtggggggac 
gaatgggatc 
ccacggggct 
accaacaacc 
aacaagatcg 
gaaccctttc 
caggaggtga 
aagacgatcc 
cagggagtgg 
accaactccg 
aagtgcttca 
aagggctgct 
gctaattttt 
agcagaccag 
actccccctc 
tcactctttg 
tcctggacac 
agccgaagat 
tcatcgaaat 
acatcatcgg 
ctatcgagac 
ggccattgac 
aagggaaaat 
agaagaagga 
cgcaagactt 
aatccgtgac 
tcaggaagta 
atcagtacaa 
tgaccaaaat 
tggatgactt 
agctgcgcca 
agcctccctt 
tcgtgctgcc 
tgaactgggc 
gcggaaccaa 
cagaaaaccg 
acctgatcgc 
agcccttcaa 
acgtcaagca 
gaaagactcc 
agtattggca 
agctgtggta 
gggccgctaa 
agaaggttgt 
tcgctttgca 
gcatcattca 
agctgatcaa 
gcaatgagca 
gcatcgacaa 
gcgacttcaa 
agctcaaggg 
attgcaccca 
tcgaggccga 



tcaaggatac 
aggcccaaca 
tcgtgcagaa 
cctgggtgaa 
ccctgtcaga 
accaggccgc 
gtgtgcatcc 
cagacatcgc 
cacccatccc 
tgcgcatgta 
gcgactacgt 
agaactggat 
tgaaggccct 
gcggacccgg 
ctaccatcat 
actgtggcaa 
ggaaatgcgg 
tagggaagat 
agccaacagc 
agaagcagga 
gcaacgaccc 
cggagcagac 
gatcggggga 
ctgcggccac 
acgcaacctg 
ggtaccggtg 
agaggagaag 
ctccaagatt 
ctcgacgaaa 
ctgggaggtt 
cgtactggat 
cactgccttc 
cgtgctgccc 
cctggagcct 
gtacgtgggc 
gcacctgttg 
cctctggatg 
agagaaagac 
cagtcagatt 
ggcactcaca 
agagatccta 
cgagatccag 
gaacctgaag 
gctgaccgag 
taagttcaag 
ggccacctgg 
ccagctggag 
cagggagact 
caccctcact 
ggactcgggc 
agcccagcca 
gaaggaaaag 
ggtcgacaag 
ggcccaggac 
cctgccccct 
cgaagccatg 
tctggagggc 
ggtcattccc 



gaaagaggcc 
ggccgccgcg 
catccagggg 
ggtggtggaa 
gggagccacc 
catgcagatg 
ggtgcacgca 
cggaacgact 
ggtgggagaa 
tagccctacc 
ggaccggttc 
gaccgaaacc 
gggcccagcg 
ccacaaggca 
gatgcagcgc 
agaagggcac 
caaggaaggc 
ctggccttcc 
cccaccagaa 
gccgatagac 
ctcgtcacaa 
gacaccgtgc 
atcggcggtt 
aaggctatcg 
ttgacgcaga 
aagctgaagc 
atcaaggcac 
gggcctgaga 
tggcgcaagc 
cagctgggca 
gtgggtgatg 
acaatccctt 
cagggctgga 
ttccgcaaac 
tctgatctag 
aggtggggac 
ggttacgagc 
agctggactg 
tacccaggga 
gaggtgatcc 
aaggagcccg 
aagcaggggc 
accggcaagt 
gccgtgcaga 
ctgcccatcc 
attcctgagt 
aaggagccca 
aagctgggca 
gacaccacca 
ctggaggtga 
gaccagagtg 
gtctatctgg 
ctggtctcgg 
gagcacgaga 
gtggtggcca 
catggccagg 
aaggttatcc 
gccgaaacag 



300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2700 

2760 

2820 

2880 

2940 

3000 

3060 

3120 

3180 

3240 

3300 

3360 

3420 

3480 

3540 

3600 

3660 

3720 



ggcaggagac 
atactgacaa 
gaatcaagca 
tgaataagga 
ccgcggtcca 
acagtgcggg 
aaaagcagat 
tctggaaagg 
atagcgacat 
agatggcggg 



agcctacttc 
tggcagcaat 
ggagttcggg 
gttaaagaag 
aatggcggta 
ggagcggatc 
taccaagatt 
cccagcgaag 
caaggtggtg 
tgatgattgc 



ctcctgaagc 
ttcaccagtg 
atcccctaca 
attatcggcc 
ttcatccaca 
gtggacatca 
cagaatttcc 
ctcctctgga 
cccagaagaa 
gtggcgagca 



tggcaggccg 
ctacggttaa 
atccccagag 
aggtcagaga 
atttcaagcg 
tcgcgaccga 

gggtctacta 

agggtgaggg 
aggcgaagat 
gacaggatga 



gtggccagtg 
ggccgcctgc 
tcagggcgtc 
tcaggctgag 
gaaggggggg 
catccagact 
cagggacagc 
ggcagtagtg 
cattagggat 
ggattag 



aagaccatcc 
tggtgggcgg 
gtcgagtcta 
catctcaaga 
attggggggt 
aaggagctgc 
agaaatcccc 
atccaggata 
tatggcaaac 



3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4307 



<210> 3 

<211> 2571 

<212> DNA 

<213> Human immunodeficiency virus type 1 



<400> 3 

atgagagtga 

cttgggttat 

gtacctgtgt 

gatacagagg 

caagaagtag 

gaacagatgc 

ttaaccccac 

aatagtactg 

aactgctctt 

ctttataaac 

tgtaatacct 

cactattgtg 

aaaggatcat 

tcaactcaac 

aatttcactg 

tgtacaagac 

tatacaacaa 

aaatggaatg 

acaatagtct 

tgtggagggg 

aataatactt 

aaacaaatta 

ggacaaatta 

gacacggaca 

tggagaagtg 

accaaggcaa 

cttgggttct 

caggccagac 

gaggcgcaac 

gtcctggctg 

ggaaaactca 

gatgatattt 

agcttaatat 

ttattggaat 

tggtatataa 

gctgtacttt 

cgccccccag 

agagacagag 

ctgcggagcc 

attgtggaac 



aggggatcag 
taatgatctg 
ggaaagaagc 
tacataatgt 
aattggtaaa 
atgaggatat 
tctgtgttac 
ctaataacaa 
tcaatatcac 
ttgatatagt 
cagtcattac 
ccccggctgg 
gtaaaaatgt 
tgctgttaaa 
ataatgctaa 
ccaactacaa 
aaaatataat 
acactttaag 
ttaatcaatc 
aatttttcta 
ggaataatac 
taaacatgtg 
gatgttcatc 
cgaacgacac 
aattatataa 
agagaagagt 
taggagcagc 
tattattgtc 
agcatatgtt 
tggaaagata 
tttgcaccac 
ggaataacat 
actcattact 
tggataaatg 
aaatattcat 
ctatagtgaa 
ttccgagggg 
acacatccgg 
tgttcctctt 
ttctgggacg 



gaggaattat 
tagtgctaca 
aaccaccact 
ttgggccaca 
tgtgacagaa 
aatcagttta 
tttaaattgc 
tagtaatagc 
cacaagcata 
atcaatagat 
acaagcttgt 
ttttgcgatt 
cagcacagta 
tggcagtcta 
aaccatcata 
taaaagaaaa 
aggaactata 
acagatagtt 
ctcaggaggg 
ctgtaataca 
tacagggtca 
gcaggaagta 
aaatattaca 
cgagatcttc 
atataaagta 
ggtgcagaga 
aggaagcact 
tggtatagtg 
gcaactcaca 
cctaaaggat 
tactgtgcct 
gacctggatg 
agaaaaatcg 
ggcaagtttg 
aatgatagta 
tagagttagg 
acccgacagg 
tcgattagtg 
cagctaccac 
cagggggtgg 



cagcactggt 
gaaaaattgt 
ctattttgtg 
caagcctgtg 
aattttaaca 
tgggatcaaa 
actgatttga 
gagggaacaa 
agagataaga 
aatgatagta 
ccaaagatat 
ctaaaatgta 
caatgtacac 
gcagaagaag 
gtacatctga 
aggatacata 
agacaagcac 
agcaaattaa 
gacccagaaa 
tcaccactgt 
aataacaata 
ggaaaagcaa 
gggctactat 
agacctggag 
gtaacaattg 
gaaaaaagag 
atgggcgcag 
caacagcaga 
gtctggggca 
caacagctcc 
tggaatgcta 
cagtgggaaa 
caaacccaac 
tggaattggt 
ggaggcttgg 
cagggatact 
cccgaaggaa 
catggattct 
cacagagact 
gaagtcctca 



ggggatgggg 
gggtcacagt 
catcagatgc 
tacccacaga 
tgtggaaaaa 
gcctaaagcc 
ggaatactac 
taaagggagg 
tgcagaaaga 
ccagctatag 
cctttgagcc 
acgataaaaa 
atggaattag 
aggtagtaat 
atgaatctgt 
taggaccagg 
attgtaacat 
aagaacaatt 
ttgtaatgca 
ttaatagtac 
tcacacttca 
tgtatgcccc 
taacaagaga 
gaggagatat 
aaccattagg 
cagcgatagg 
cgtcagtgac 
acaatttgct 
tcaagcagct 
tggggttttg 
gttggagtaa 
gagaaattga 
aagaaaagaa 
ttgacataac 
taggtttaag 
caccattgtc 
tcgaagaaga 
tagcaattat 
tactcttgat 
aatattggtg 



cacgatgctc 
ctattatggg 
taaagcatat 
ccccaaccca 
taacatggta 
atgtgtaaaa 
taataccaat 
agaaatgaaa 
atatgcactt 
gttgataagt 
aattcccata 
gttcagtgga 
gccagtagta 
tagatctgag 
acaaattaat 
gagagcattt 
tagtagagca 
taagaataaa 
cagttttaat 
ttggaatggt 
atgcaaaata 
tcccattgaa 

tggtggtaag 

gagggacaat 
agtagcaccc 
agctctgttc 
gctgacggta 
gagggccatt 
ccaggcaaga 

gggttgctct 

taaatctctg 
caattacaca 
tgaacaagaa 
aaattggctg 
aatagttttt 
gttgcagacc 
aggtggagag 
ctgggtcgac 
tgcagcgagg 
gaatctccta 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 



cagtattgga gtcaggaact aaagagtagt gctgttagct tgcttaatgc cacagctata 2460 
gcagtagctg aggggacaga tagggttata gaagtactgc aaagagctgg tagagctatt 2520
ctccacatac ctacaagaat aagacagggc ttggaaaggg ctttgctata a 2571 



<210> 4 

<211> 2571 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: 

SYNgp-160mn-codon optimised env sequence 



<400> 4 

atgagggtga 

ctggggctgc 

gtgcccgtgt 

gacaccgagg 

caggaggtgg 

gagcagatgc 

ctgacccccc 

aacagcaccg 

aactgcagct 

ctgtacaagc 

tgcaacacca 

cactactgcg 

aagggcagct 

agcacccagc 

aacttcaccg 

tgcacgcgtc 

tacaccacca 

aagtggaacg 

accatcgtgt 

tgcggcggcg 

aacaacacct 

aagcagatca 

ggccagatcc 

gacaccgaca 

tggagatctg 

accaaggcca 

ctgggcttcc 

caggcccgcc 

gaggcccagc 

gtgctggccg 

ggcaagctga 

gacgacatct 

agcctgatct 

ctgctggagc 

tggtacatca 

gccgtgctga 

cggccccccg 

cgcgaccgcg 

ctccgcagcc 

atcgtggaac 

cagtattgga 

gccgtggccg 

ctgcacatcc 



aggggatccg 
tgatgatctg 
ggaaggaggc 
tgcacaacgt 
agctcgtgaa 
atgaggacat 
tgtgcgtgac 
ccaacaacaa 
tcaacatcac 
tggatatcgt 
gcgtgatcac 
cccccgccgg 
gcaagaacgt 
tcctgctgaa 
acaacgccaa 
ccaactacaa 
agaacatcat 
acaccctgcg 
tcaaccagag 
aattcttcta 
ggaacaacac 
tcaacatgtg 
ggtgcagcag 
ccaacgacac 
agctgtacaa 
agcgccgcgt 
tgggggcggc 
tgctcctgag 
agcatatgct 
tggagcgcta 
tctgcaccac 
ggaacaacat 
acagcctgct 
tggacaagtg 
aaatcttcat 
gcatcgtgaa 
tgccgcgcgg 
acaccagcgg 
tgttcctgtt 
tcctaggccg 
gccaggagct 
agggcaccga
ccacccgcat 



ccgcaactac 
cagcgccacc 
caccaccacc 
gtgggccacc 
cgtgaccgag 
catcagcctg 
cctgaactgc 
cagcaacagc 
caccagcatc 
gagcatcgac 
ccaggcctgc 
cttcgccatc 
gagcaccgtg 
cggcagcctg 
gaccatcatc 
caagcgcaag 
cggcaccatc 
ccagatcgtg 
cagcggcggc 
ctgcaacacc 
caccggcagc 
gcaggaggtg 
caacatcacc 
cgaaatcttc 
gtacaaggtg 
ggtgcagcgc 
gggcagcacc 
cggcatcgtg 
ccagctcacc 
cctgaaggac 
cacggtaccc 
gacctggatg 
ggagaagagc 
ggcgagcctg 
catgattgtg 
ccgcgtgcgc 
gcccgaccgc 
caggctcgtg 
cagctaccac 
ccgcggctgg 
gaagtccagc 
ccgcgtgatc 
ccgccagggg 



cagcactggt 
gagaagctgt 
ctgttctgcg 
caggcgtgcg 
aacttcaaca 
tgggaccaga 
accgacctga 
gagggcacca 
cgcgacaaga 
aacgacagca 
cccaagatca 
ctgaagtgca 
cagtgcaccc 
gccgaggagg 
gtgcacctga 
cgcatccaca 
cgccaggccc 
agcaagctga 
gaccccgaga 
agccccctgt 
aacaacaata 
ggcaaggcca 
ggtctgctgc 
cgccccggcg 
gtgacgatcg 
gagaagcggg 
atgggggccg 
cagcagcaga 
gtgtggggca 
cagcagctcc 
tggaacgcct 
cagtgggagc 
cagacccagc 
tggaactggt 
ggcggcctgg 
cagggctaca 
cccgagggca 
cacggcttcc 
caccgcgacc 
gaggtgctga 
gccgtgagcc 
gaggtgctcc 
ctcgagaggg 



ggggctgggg 
gggtgaccgt 
ccagcgacgc 
tgcccaccga 
tgtggaagaa 
gcctgaagcc 
ggaacaccac 
tcaagggcgg 
tgcagaagga 
ccagctaccg 
gcttcgagcc 
acgacaagaa 
acggcatccg 
aggtggtgat 
atgagagcgt 
tcggccccgg 
actgcaacat 
aggagcagtt 
tcgtgatgca 
tcaacagcac 
ttaccctcca 
tgtacgcccc 
tgacccgcga 
gcggcgacat 
agcccctggg 
ccgccatcgg 
ccagcgtgac 
acaacctcct 
tcaagcagct 
tgggcttctg 

cctggagcaa 
gcgagatcga 
aggagaagaa 
tcgacatcac 
tgggcctccg 
gccccctgag 
tcgaggagga 
tggcgatcat 
tgctgctgat 
agtactggtg 
tgctgaacgc 
agagggccgg 

cgctgctgta 



cacgatgctc 
gtactacggc 
caaggcgtac 
ccccaacccc
caacatggtg 
ctgcgtgaag 
caacaccaac 
cgagatgaag 
gtacgccctg 
cctgatctcc 
catccccatc 
gttcagcggc 
gccggtggtg 
ccgcagcgag 
gcagatcaac 
gcgcgccttc 
ctctagagcc 
caagaacaag 
cagcttcaac 
ctggaacggc 
gtgcaagatc 
ccccatcgag 
cggcggcaag 
gcgcgacaac 
cgtggccccc 
cgccctgttc 
cctgaccgtg 
ccgcgccatc 
ccaggcccgc 
gggctgctcc 
caagagcctg 
taactacacc 
cgagcaggag 
caactggctg 
catcgtgttc 
cctccagacc 
gggcggcgag 
ctgggtcgac 
cgccgcccgc 
gaacctcctc 
caccgccatc 
gagggcgatc 
a 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2571 



<210> 5 

<211> 116 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 5 

tcgagcccgg ggatgacgtc atcgacttcg aaggttcgaa tccttctact gccaccattt 60
tttctctacg tcatcgactt cgaaggttcg aatccttccc tgtccaccag tcgacc 116



<210> 6 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 6 

tcgagtatta cgtcatcgac ttcgaaggtt cgaatccttc tagattcacc attttttagg 60
aacgtcatcg acttcgaagg ttcgaatcct tccagttcca ccagtcgacc 110



<210> 7 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 7 

tcgaggccaa cgtcatcgac ttcgaaggtt cgaatccttc tcttcccacc attttttttc 60
cacgtcatcg acttcgaagg ttcgaatcct tcggggccca ccagtcgacc 110



<210> 8 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 8 

tcgagggcta cgtcatcgac ttcgaaggtt cgaatccttc ttgcttcacc attttttctg 60
aacgtcatcg acttcgaagg ttcgaatcct tctgctgtca ccagtcgacc 110



7 



<210> 9 

<211> 110 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 9 

tcgagtataa cgtcatcgac ttcgaaggtt cgaatccttc accggtcacc atttttttat 60 
aacgtcatcg acttcgaagg ttcgaatcct tcttcttaca ccagtcgacc 110 



<210> 10 

<211> 116 

<212> DNA 

<213> Artificial Sequence 



Q 



<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 



<400> 10 

tcgaggtaca cgtcatcgac ttcgaaggtt cgaatccttc gtagttcacc attttttgtg 60 
cacgtcatcg acttcgaagg ttcgaatcct tctaggccca ccagtcgacg catgcc 116 



ru 



<210> 11 

<211> 8560 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
nucleotide pH4DOZENEGS sequence 



<400> 11 

ctgacgcgcc 

ccgctacact 

ccacgttcgc 

ttagtgcttt 

ggccatcgcc 

gtggactctt 

tataagggat 

ttaacgcgaa 

caactgttgg 

gggatgtgct 

taaaacgacg 

ccgcggtggc 

gaccgcccaa 

caatagggac 

cagtacatca 

ggcccgcctg 

tctacgtatt 

gtggatagcg 

gtttgttttg 

tgacgcaaat 



ctgtagcggc 
tgccagcgcc 
cggctttccc 
acggcacctc 
ctgatagacg 
gttccaaact 
tttgccgatt 
ttttaacaaa 
gaagggcgat 
gcaaggcgat 
gccagtgagc 
ggccgctcta 
cgacccccgc 
tttccattga 
agtgtatcat 
gcattatgcc 
agtcatcgct 
gtttgactca 
gcaccaaaat 
gggcggtagg 



gcattaagcg 
ctagcgcccg 
cgtcaagctc 
gaccccaaaa 
gtttttcgcc 
ggaacaacac 
tcggcctatt 
atattaacgc 
cggtgcgggc 
taagttgggt 
gcgcgtaata 
gagtccgtta 
ccattgacgt 
cgtcaatggg 
atgccaagta 
cagtacatga 
attaccatgg 
cggggatttc 
caacgggact 
cgtgtacggt 



cggcgggtgt 
ctcctttcgc 
taaatcgggg 
aacttgatta 
ctttgacgtt 
tcaaccctat 
ggttaaaaaa 
ttacaatttc 
ctcttcgcta 
aacgccaggg 
cgactcacta 
cataacttac 
caataatgac 
tggagtattt 
cgccccctat 
ccttatggga 
tgatgcggtt 
caagtctcca 
ttccaaaatg 
gggaggtcta 



ggtggttacg 

tttcttccct 
gctcccttta 
gggtgatggt 
ggagtccacg 
ctcggtctat 
tgagctgatt 
cattcgccat 
ttacgccagc 
ttttcccagt 
tagggcgaat 
ggtaaatggc 
gtatgttccc 
acggtaaact 
tgacgtcaat 
ctttcctact 
ttggcagtac 
ccccattgac 
tcgtaacaac 
tataagcaga 



cgcagcgtga 
tcctttctcg 
gggttccgat 
tcacgtagtg 
ttctttaata 
tcttttgatt 
taacaaaaat 
tcaggctgcg 
tggcgaaagg 
cacgacgttg 
tggagctcca 
ccgcctggct 
atagtaacgc 
gcccacttgg 
gacggtaaat 
tggcagtaca 
atcaatgggc 
gtcaatggga 
tccgccccat 
gctcgtttag 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 



8 



tgaaccggtc tctctggtta gaccagatct gagcctggga gctctctggc taactaggga 1260 
acccactgct taagcctcaa taaagcttgc cttgagtgct tcaagtagtg tgtgcccgtc 1320 
tgttgtgtga ctctggtaac tagagatccc tcagaccctt ttagtcagtg tggaaaatct 1380 
ctagcagtgg cgcccgaaca gggacttgaa agcgaaaggg aaaccagagg agctctctcg 1440 
acgcaggact cggcttgctg aagcgcgcac ggcaagaggc gaggggcggc gactggtgag 1500 
tacgccaaaa attttgacta gcggaggcta gaaggagaga gatgggtgcg agagcgtcag 1560 
tattaagcgg gggagaatta gatcgcgatg ggaaaaaatt cggttaaggc cagggggaaa 1620
gaaaaaatat aaattaaaac atatagtatg ggcaagcagg gagctagaac gattcgcagt 1680 
taatcctggc ctgttagaaa catcagaagg ctgtagacaa atactgggac agctacaacc 1740 
atcccttcag acaggatcag aagaacttag atcattatat aatacagtag caaccctcta 1800 
ttgtgtgcat caaaggttga gataaaagac accaaggaag ctttagacaa gatagaggga 1860 
gagcaaaaca aaagtaagaa aaaagcacag caagcagcag ctgacacagg acacagcaat 1920
caggtcagcc aaaattaccc tatagtgcag aacatccagg ggcaaatggt acatcaggcc 1980 
atatcaccta gaactttaaa tgcatgggta aaagtagtag aagagaaggc tttcagccca 2040 
gaagtgatac ccatgttttc agcattatca gaaggagcca ccccacaaga tttaaacacc 2100 
atgctaaaca cagtgggggg acatcaagca gccatgcaaa tgttaaaaga gaccatcaat 2160 
gaggaagctg caggaattcg cctaaaactg cttgtaccaa ttgctattgt aaaaagtgtt 2220 
gctttcattg ccaagtttgt ttcataacaa aagccttagg catctcctat ggcaggaaga 2280
agcggagaca gcgacgaaga gctcatcaga acagtcagac tcatcaagct tctctatcaa 2340 
agcagtaagt agtacatgta acgcaaccta taccaatagt agcaatagta gcattagtag 2400 
tagcaataat aatagcaata gttgtgtggt ccatagtaat catagaatat aggaaaatat 2460 
taagacaaag aaaaatagac aggttaattg atagactaat agaaagagca gaagacagtg 2520
gcaatgagag tgaaggagaa atatcagcac ttgtggagat gggggtggag atggggcacc 2580
atgctccttg ggatgttgat gatctgtagt gctacagaaa aattgtgggt cacagtctat 2640 
tatggggtac ctgtgtggaa ggaagcaacc accactctat tttgtgcatc agatgctaaa 2700 
gcatagatct tcagacttgg aggaggagat atgagggaca attggagaag tgaattatat 2760
aaatataaag tagtaaaaat tgaaccatta ggagtagcac ccaccaaggc aaagagaaga 2820
gtggtgcaga gagaaaaaag agcagtggga ataggagctt tgttccttgg gttcttggga 2880 
gcagcaggaa gcactatggg cgcagcgtca atgacgctga cggtacaggc cagacaatta 2940
ttgtctggta tagtgcagca gcagaacaat ttgctgaggg ctattgaggc gcaacagcat 3000 
ctgttgcaac tcacagtctg gggcatcaag cagctccagg caagaatcct ggctgtggaa 3060 
agatacctaa aggatcaaca gctcctgggg atttggggtt gctctggaaa actcatttgc 3120 
accactgctg tgccttggaa tgctagttgg agtaataaat ctctggaaca gatctggaat 3180 
cacacgacct ggatggagtg ggacagagaa attaacaatt acacaagctt aatacactcc 3240 
ttaattgaag aatcgcaaaa ccagcaagaa aagaatgaac aagaattatt ggaattagat 3300 
aaatgggcaa gtttgtggaa ttggtttaac ataacaaatt ggctgtggta tataaaatta 3360 
ttcataatga tagtaggagg cttggtaggt ttaagaatag tttttgctgt actttctata 3420 
gtgaatagag ttaggcaggg atattcacca ttatcgtttc agacccacct cccaaccccg 3480 
aggggacccg acaggcccga aggaatagaa gaagaaggtg gagagagaga cagagacaga 3540
tccattcgat tagtgaacgg atccttggca cttatctggg acgatctgcg gagcctgtgc 3600 
ctcttcagct accaccgctt gagagactta ctcttgattg taacgaggat tgtggaactt 3660 
ctgggacgca gggggtggga agccctcaaa tattggtgga atctcctaca gtattggagt 3720
caggaactaa agaatagtgc tgttagcttg ctcaatgcca cagccatagc agtagctgag 3780 
gggacagata gggttataga agtagtacaa ggagcttgta gagctattcg ccacatacct 3840 
agaagaataa gacagggctt ggaaaggatt ttgctataag atgggtggca agtggtcaaa 3900
aagtagtgtg attggatggc ctactgtaag ggaaagaatg agacgagctg agccagcagc 3960
agatagggtg ggagcagcat ctcgacgctg caggagtggg gaggcacgat ggccgctttg 4020
gtcgaggcgg atccggccat tagccatatt attcattggt tatatagcat aaatcaatat 4080 
tggctattgg ccattgcata cgttgtatcc atatcataat atgtacattt atattggctc 4140 
atgtccaaca ttaccgccat gttgacattg attattgact agttattaat agtaatcaat 4200 
tacggggtca ttagttcata gcccatatat ggagttccgc gttacataac ttacggtaaa 4260 
tggcccgcct ggctgaccgc ccaacgaccc ccgcccattg acgtcaataa tgacgtatgt 4320 
tcccatagta acgccaatag ggactttcca ttgacgtcaa tgggtggagt atttacggta 4380
aactgcccac ttggcagtac atcaagtgta tcatatgcca agtacgcccc ctattgacgt 4440 
caatgacggt aaatggcccg cctggcatta tgcccagtac atgaccttat gggactttcc 4500 
tacttggcag tacatctacg tattagtcat cgctattacc atggtgatgc ggttttggca 4560 
gtacatcaat gggcgtggat agcggtttga ctcacgggga tttccaagtc tccaccccat 4620
tgacgtcaat gggagtttgt tttggcacca aaatcaacgg gactttccaa aatgtcgtaa 4680 



caactccgcc 
cagagctcgt 
ccatagaaga 
cggggatgac 
acgtcatcga 
gacttcgaag 
aggttcgaat 
atccttctct 
gggcccacca 
cattttttct 
tataacgtca 
catcgacttc 
tcgaaggttc 
tcgaatcctt 
gacctagaaa 
gcctggctag 
ttaagaccaa 
ggactggaag 
cacacacaag 
ccactgacct 
gccaatgaag 
ccggagagag 
cgagagctgc 
tccgctgggg 
agatgctgca 
ctgagcctgg 
gccttgagtg 
cctcagaccc 
agcttttgtt 
tttcctgtgt 
aagtgtaaag 
ctgcccgctt 
gcggggagag 
cgctcggtcg 
tccacagaat 
aggaaccgta 
catcacaaaa 
caggcgtttc 
ggatacctgt 
aggtatctca 
gttcagcccg 
cacgacttat 
ggcggtgcta 
tttggtatct 
tccggcaaac 
cgcagaaaaa 
tggaacgaaa 
tagatccttt 
tggtctgaca 
cgttcatcca 
ccatctggcc 
tcagcaataa 
gcctccatcc 
agtttgcgca 
atggcttcat 
tgcaaaaaag 
gtgttatcac 
agatgctttt 



ccattgacgc 
ttagtgaacc 
caccgggacc 
gtcatcgact 
cttcgaaggt 
gttcgaatcc 
ccttccagtt 
tcccaccatt 
gtcgagggct 
gaacgtcatc 
tcgacttcga 
gaaggttcga 
gaatccttcg 
ctaggcccac 
aacatggagc 
aagcacaaga 
tgacttacaa 
ggctaattca 
gctacttccc 
ttggatggtg 
gagagaacac 
aagtattaga 
atccggagta 
actttccagg 
tataagcagc 
gagctctctg 
cttcaagtag 
ttttagtcag 
ccctttagtg 
gaaattgtta 
cctggggtgc 
tccagtcggg 
gcggtttgcg 
ttcggctgcg 
caggggataa 
aaaaggccgc 
atcgacgctc 
cccctggaag 
ccgcctttct 
gttcggtgta 
accgctgcgc 
cgccactggc 
cagagttctt 
gcgctctgct 
aaaccaccgc 
aaggatctca 
actcacgtta 
taaattaaaa 
gttaccaatg 
tagttgcctg 
ccagtgctgc 
accagccagc 
agtctattaa 
acgttgttgc 
tcagctccgg 
cggttagctc 
tcatggttat 
ctgtgactgg 



aaatgggcgg 
gtcagatcgc 
gatccagcct 
tcgaaggttc 
tcgaatcctt 
ttctagattc 
ccaccagtcg 
ttttttccac 
acgtcatcga 
gacttcgaag 
aggttcgaat 
atccttcttc 
tagttcacca 
cagtcgacgc 
aatcacaagt 
ggaggaggag 
ggcagctgta 
ctcccaacga 
tgattggcag 
ctacaagcta 
ccgcttgtta 
gtggaggttt 
cttcaagaac 
gaggcgtggc 
tgctttttgc 
gctaactagg 
tgtgtgcccg 
tgtggaaaat 
agggttaatt 
tccgctcaca 
ctaatgagtg 
aaacctgtcg 
tattgggcgc 
gcgagcggta 
cgcaggaaag 
gttgctggcg 
aagtcagagg 
ctccctcgtg 
cccttcggga 
ggtcgttcgc 
cttatccggt 
agcagccact 
gaagtggtgg 
gaagccagtt 
tggtagcggt 
agaagatcct 
agggattttg 
atgaagtttt 
cttaatcagt 
actccccgtc 
aatgataccg 
cggaagggcc 
ttgttgccgg 
cattgctaca 
ttcccaacga 
cttcggtcct 
ggcagcactg 
tgagtactca 



taggcatgta 
ctggagacgc 
ccgcggcccc 
gaatccttct 
ccctgtccac 
accatttttt 
aggccaacgt 
gtcatcgact 
cttcgaaggt 
gttcgaatcc 
ccttcaccgg 
ttacaccagt 
ttttttgtgc 
atgcctgcag 
agcaatacag 
gtgggttttc 
gatcttagcc 
agacaagata 
aactacacac 
gtaccagttg 
caccctgtga 
gacagccgcc 
tgctgacatc 
ctgggcggga 
ctgtactggg 
gaacccactg 
tctgttgtgt 
ctctagcagt 
gcgcgcttgg 
attccacaca 
agctaactca 
tgccagctgc 
tcttccgctt 
tcagctcact 
aacatgtgag 
tttttccata 
tggcgaaacc 
cgctctcctg 
agcgtggcgc 
tccaagctgg 
aactatcgtc 
ggtaacagga 
cctaactacg 
accttcggaa 
ggtttttttg 
ttgatctttt 
gtcatgagat 
aaatcaatct 
gaggcaccta 
gtgtagataa 
cgagacccac 
gagcgcagaa 
gaagctagag 
ggcatcgtgg 
tcaaggcgag 
ccgatcgttg 
cataattctc 
accaagtcat 



cggtgggagg 
catccacgct 
aagcttcagc 
actgccacca 
cagtcgagta 
aggaacgtca 
catcgacttc 
tcgaaggttc 
tcgaatcctt 
ttctgctgtc 
tcaccatttt 
cgaggtacac 
acgtcatcga 
gtcgaggtcg 
cagctaccaa 
cagtcacacc 
actttttaaa 
tccttgatct 
cagggccagg 
agcaagagaa 
gcctgcatgg 
tagcatttca 
gagcttgcta 
ctggggagtg 
tctctctggt 
cttaagcctc 
gactctggta 
cgaggggggg 
cgtaatcatg 
acatacgagc 
cattaattgc 
attaatgaat 
cctcgctcac 
caaaggcggt 
caaaaggcca 
ggctccgccc 
cgacaggact 
ttccgaccct 
tttctcatag 
gctgtgtgca 
ttgagtccaa 
ttagcagagc 
gctacactag 
aaagagttgg 
tttgcaagca 
ctacggggtc 
tatcaaaaag 
aaagtatata 
tctcagcgat 
ctacgatacg 
gctcaccggc 
gtggtcctgc 
taagtagttc 
tgtcacgctc 
ttacatgatc 
tcagaagtaa 
ttactgtcat 
tctgagaata 



tctatataag 
gttttgacct 
tgctcgagcc 
ttttttctct 
ttacgtcatc 
tcgacttcga 
gaaggttcga 
gaatccttcg 
cttgcttcac 
accagtcgag 
tttataacgt 
gtcatcgact 
cttcgaaggt 
ataccgtcga 
tgctgattgt 
tcaggtacct 
agaaaagggg 
gtggatctac 
gatcagatat 
ggtagaagaa 
gatggatgac 
tcacatggcc 
caagggactt 
gcgagccctc 
tagaccagat 
aataaagctt 
actagagatc 
cccggtaccc 
gtcatagctg 
cggaagcata 
gttgcgctca 
cggccaacgc 
tgactcgctg 
aatacggtta 
gcaaaaggcc 
ccctgacgag 
ataaagatac 
gccgcttacc 
ctcacgctgt 
cgaacccccc 
cccggtaaga 
gaggtatgta 
aaggacagta 
tagctcttga 
gcagattacg 
tgacgctcag 
gatcttcacc 
tgagtaaact 
ctgtctattt 
ggagggctta 
tccagattta 
aactttatcc 
gccagttaat 
gtcgtttggt 
ccccatgttg 
gttggccgca 
gccatccgta 
gtgtatgcgg 



4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 
5280 
5340 
5400 
5460 
5520 
5580 
5640 
5700 
5760 
5820 
5880 
5940 
6000 
6060 
6120 
6180 
6240 
6300 
6360 
6420 
6480 
6540 
6600 
6660 
6720 
6780 
6840 
6900 
6960 
7020 
7080 
7140 
7200 
7260 
7320 
7380 
7440 
7500 
7560 
7620 
7680 
7740 
7800 
7860 
7920 
7980 
8040 
8100 
8160 
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cgaccgagtt gctcttgccc ggcgtcaata cgggataata ccgcgccaca tagcagaact 8220 
ttaaaagtgc tcatcattgg aaaacgttct tcggggcgaa aactctcaag gatcttaccg 8280 
ctgttgagat ccagttcgat gtaacccact cgtgcaccca actgatcttc agcatctttt 8340 
actttcacca gcgtttctgg gtgagcaaaa acaggaaggc aaaatgccgc aaaaaaggga 8400
ataagggcga cacggaaatg ttgaatactc atactcttcc tttttcaata ttattgaagc 8460 
atttatcagg gttattgtct catgagcgga tacatatttg aatgtattta gaaaaataaa 8520 
caaatagggg ttccgcgcac atttccccga aaagtgccac 8560 



<210> 12 

<211> 4642 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: pSYNGP2 -codon 
optimised HIV-1 gagpol with leader sequence 



<400> 12 

gggtctctct 

ctgcttaagc 

tgtgactctg 

agtggcgccc 

ctcggcttgc 

aaaaattttg 

cgggcggcga 

acaagctgaa 

ggctcctgga 

aaaccggcag 

accagcgcat 

ataagagcaa 

gccagaacta 

cccgcacgct 

tacccatgtt 

acacagtggg 

ctgccgaatg 

gtgagccacg 

ggatgaccaa 

gcctgaacaa 

cgaaggaacc 

ctagccagga 

actgcaagac 

cctgtcaggg 

aggtgaccaa 

tcgtcaagtg 

ggaaaaaggg 

gacaggctaa 

ttcagagcag 

caacaactcc 

tcagatcact 

ggctctcctg 

ctggaagccg 

gatcctcatc 

cgtcaacatc 

tagccctatc 

gcaatggcca 

aaaggaaggg 

aatcaagaag 



ggttagacca 
ctcaataaag 
gtaactagag 
gaacagggac 
tgaagcgccc 
actagcggag 
gctggaccgc 
gcacatcgtg 
gaccagcgag 
cgaggagctg 
cgaaatcaag 
aaagaaggcc 
ccccatcgtg 
gaacgcctgg 
ctcagccctg 
gggacaccag 
ggatcgtgtg 
gggctcagac 
caacccaccc 
gatcgtgcgc 
ctttcgcgac 
ggtgaagaac 
gatcctgaag 
agtgggcgga 
ctccgctacc 
cttcaactgt 
ctgttggaaa 
ttttttaggg 
accagagcca 
ctctcagaag 
ctttggcagc 
gacaccggag 
aagatgatcg 
gaaatctgcg 
atcggacgca 
gagacggtac 
ttgacagagg 
aaaatctcca 
aaggactcga 



gatctgagcc 
cttgccttga 
atccctcaga 
ctgaaagcga 
gcacggcaag 
gctagaagga 
tgggagaaga 
tgggccagcc 
gggtgccgcc 
cgcagcctgt 
gatacgaaag 
caacaggccg 
cagaacatcc 
gtgaaggtgg 
tcagagggag 
gccgccatgc 
catccggtgc 
atcgccggaa 
atcccggtgg 
atgtatagcc 
tacgtggacc 
tggatgaccg 
gccctgggcc 
cccggccaca 
atcatgatgc 
ggcaaagaag 
tgtggaaagg 
aagatctggc 
acagccccac 
caggagccga 
gacccctcgt 
cagacgacac 
ggggaatcgg 
gccacaaggc 
acctgttgac 
cggtgaagct 
agaagatcaa 
agattgggcc 
cgaaatggcg 



tgggagctct 
gtgcttcaag 
cccttttagt 
aagggaaacc 
aggcgagggg 
gagagatggg 
tccgcctgcg 
gcgaactgga 
agatcctcgg 
acaacaccgt 
aggccctgga 
ccgcggacac 
aggggcagat 
tggaagagaa 
ccacccccca 
agatgctgaa 
acgcagggcc 
cgactagtac 
gagaaatcta 
ctaccagcat 
ggttctacaa 
aaaccctgct 
cagcggctac 
aggcacgcgt 
agcgcggcaa 
ggcacacagc 
aaggacacca 
cttcccacaa 
cagaagagag 
tagacaagga 
cacaataaag 
cgtgctggag 
cggtttcatc 
tatcggtacc 
gcagatcggt 
gaagcccggg 
ggcactggtg 
tgagaacccg 
caagctggtg 



ctggctaact 
tagtgtgtgc 
cagtgtggaa 
agagctctct 
cggcgactgg 
cgcccgcgcc 
ccccggcggc 
gcgcttcgcc 
ccaactgcag 
ggccacgctg 
taaaatcgaa 
cggacacagc 
ggtgcaccag 
ggcttttagc 
agatctgaac 
ggagaccatc 
catcgcaccg 
ccttcaggaa 
caaacgctgg 
cctggacatc 
aacgctccgc 
ggtccagaac 
cctagaggaa 
cctggctgag 
ctttcggaac 
ccgcaactgc 
aatgaaagat 
gggaaggcca 
cttcaggttt 
actgtatcct 
ataggggggc 
gagatgtcgt 
aaggtgcgcc 
gtgctggtgg 
tgcacgctga 
atggacggcc 
gagatttgca 
tacaacacgc 
gacttccgcg 



agggaaccca 
ccgtctgttg 
aatctctagc 
cgacgcagga 
tgagtacgcc 
agcgtgctgt 
aaaaagaagt 
gtgaaccccg 
cccagcctgc 
tactgcgtcc 
gaggaacaga 
aaccaggtca 
gccatctccc 
ccggaggtga 
accatgctca 
aatgaggagg 
ggccagatgc 
cagatcggct 
atcatcctgg 
cgccaaggcc 
gccgagcagg 
gcgaacccgg 
atgatgaccg 
gccatgagcc 
caacgcaaga 
agggccccta 
tgtactgaga 
gggaattttc 
ggggaagaga 
ttagcttccc 
agctcaagga 
tgccaggccg 
agtatgacca 
gccccacacc 
acttccccat 
cgaaggtcaa 
cagagatgga 
cggtgttcgc 
agctgaacaa 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 
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gcgcacgcaa 
gaagaaatcc 
agacttcagg 
tcgatatcag 
tagcatgacc 
gtacatggat 
cgaggagctg 
gaaggagcct 
gcctatcgtg 
gaagttgaac 
cctccgcgga 
actggcagaa 
caaggacctg 
ccaggagccc 
taacgacgtc 
ctggggaaag 
gacagagtat 
ggtgaagctg 
ggatggggcc 
cagacagaag 
ttacctcgct 
cctgggcatc 
cgagcagctg 
tggcggcaat 
ggatggcatc 
ggctagcgac 
gtgtcagctc 
actcgattgc 
ctacatcgag 
gaagctggca 
cagtgctacg 
ctacaatccc 
cggccaggtc 
ccacaatttc 
catcatcgcg 
tttccgggtc 
ctggaagggt 
aagaaaggcg 
gagcagacag 



gacttctggg 
gtgaccgtac 
aagtacactg 
tacaacgtgc 
aaaatcctgg 
gacttgtacg 
cgccagcacc 
cccttcctct 
ctgccagaga 
tgggccagtc 
accaaggcac 
aaccgagaga 
atcgccgaga 
ttcaagaacc 
aagcagctga 
actcctaagt 
tggcaggcca 
tggtaccagc 
gctaacaggg 
gttgtcaccc 
ttgcaggact 
attcaagccc 
atcaagaagg 
gagcaggtcg 
gacaaggccc 
ttcaacctgc 
aagggcgaag 
acccatctgg 
gccgaggtca 
ggccggtggc 
gttaaggccg 
cagagtcagg 
agagatcagg 
aagcggaagg 
accgacatcc 
tactacaggg 
gagggggcag 
aagatcatta 
gatgaggatt 



aggttcagct 
tggatgtggg 
ccttcacaat 
tgccccaggg 
agcctttccg 
tgggctctga 
tgttgaggtg 
ggatgggtta 
aagacagctg 
agatttaccc 
tcacagaggt 
tcctaaagga 
tccagaagca 
tgaagaccgg 
ccgaggccgt 
tcaagctgcc 
cctggattcc 
tggagaagga 
agactaagct 
tcactgacac 
cgggcctgga 
agccagacca 
aaaaggtcta 
acaagctggt 
aggacgagca 
cccctgtggt 
ccatgcatgg 
agggcaaggt 
ttcccgccga 
cagtgaagac 
cctgctggtg 
gcgtcgtcga 
ctgagcatct 
gggggattgg 
agactaagga 
acagcagaaa 
tagtgatcca 
gggattatgg 
ag 



gggcatcccg 
tgatgcctac 
cccttcgatc 
ctggaaaggc 
caaacagaac 
tctagagata 
gggactgacc 
cgagctgcac 
gactgtcaac 
agggattaag 
gatcccccta 
gcccgtgcac 
ggggcaaggc 
caagtacgcc 
gcagaagatc 
catccagaag 
tgagtgggag 
gcccatagtg 
gggcaaagcc 
caccaaccag 
ggtgaacatc 
gagtgagtcc 
tctggcctgg 
ctcggctggc 
cgagaaatac 
ggccaaagag 
ccaggtggac 
tatcctggta 
aacagggcag 
catccatact 
ggcgggaatc 
gtctatgaat 
caagaccgcg 
ggggtacagt 
gctgcaaaag 
tcccctctgg 
ggataatagc 
caaacagatg 



caccccgcag 
ttctccgttc 
aacaacgaga 
tctcccgcaa 
cccgacatcg 
gggcagcacc 
acacccgaca 
cctgacaaat 
gacatacaga 
gtgaggcagc 
accgaggagg 
ggcgtgtact 
cagtggacct 
cggatgaggg 
accaccgaaa 
gaaacctggg 
ttcgtcaaca 
ggcgccgaaa 
ggatacgtca 
aagactgagc 
gtgacagact 
gagctggtca 
gtacccgccc 
atcaggaagg 
cacagcaact 
atcgtggcca 
tgtagccccg 
gccgtccatg 
gagacagcct 
gacaatggca 
aagcaggagt 
aaggagttaa 
gtccaaatgg 
gcgggggagc 
cagattacca 
aaaggcccag 
gacatcaagg 
gcgggtgatg 



ggctgaagaa 
ccctggacga 
caccggggat 
tcttccagag 
tcatctatca 
gcaccaagat 
agaagcacca 
ggaccgtgca 
agctggtggg 
tgtgcaaact 
ccgagctcga 
atgacccctc 
atcagattta 
gtgcccacac 
gcatcgtgat 
aaacctggtg 
cccctcccct 
ccttctacgt 
ctaaccgggg 
tgcaggccat 
ctcagtatgc 
atcagatcat 
acaaaggcat 
tgctattcct 
ggcgggccat 
gctgtgacaa 
gcatctggca 
tggccagtgg 
acttcctcct 
gcaatttcac 
tcgggatccc 
agaagattat 
cggtattcat 
ggatcgtgga 
agattcagaa 
cgaagctcct 
tggtgcccag 
attgcgtggc 



2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4642 



<210> 13 
<211> 4353 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: pSYNGP3 -codon 
optimised HIV-1 gagpol with leader sequence from 
the major splice donor 



<400> 13 

gtgagtacgc caaaaatttt gactagcgga ggctagaagg agagagatgg gcgcccgcgc 60
cagcgtgctg tcgggcggcg agctggaccg ctgggagaag atccgcctgc gccccggcgg 120
caaaaagaag tacaagctga agcacatcgt gtgggccagc cgcgaactgg agcgcttcgc 180
cgtgaacccc gggctcctgg agaccagcga ggggtgccgc cagatcctcg gccaactgca 240
gcccagcctg caaaccggca gcgaggagct gcgcagcctg tacaacaccg tggccacgct 300
gtactgcgtc caccagcgca tcgaaatcaa ggatacgaaa gaggccctgg ataaaatcga 360
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agaggaacag 
caaccaggtc 
ggccatctcc 
cccggaggtg 
caccatgctc 
caatgaggag 
gggccagatg 
acagatcggc 
gatcatcctg 
ccgccaaggc 
cgccgagcag 
cgcgaacccg 
aatgatgacc 
ggccatgagc 
ccaacgcaag 
cagggcccct 
ttgtactgag 
agggaatttt 
tggggaagag 
tttagcttcc 
cagctcaagg 
ttgccaggcc 
cagtatgacc 
ggccccacac 
aacttcccca 
ccgaaggtca 
acagagatgg 
ccggtgttcg 
gagctgaaca 
gggctgaaga 
cccctggacg 
acaccgggga 
atcttccaga 
gtcatctatc 
cgcaccaaga 
aagaagcacc 
tggaccgtgc 
aagctggtgg 
ctgtgcaaac 
gccgagctcg 
tatgacccct 
tatcagattt 
ggtgcccaca 
agcatcgtga 
gaaacctggt 
acccctcccc 
accttctacg 
actaaccggg 
ctgcaggcca 
tctcagtatg 
aatcagatca 
cacaaaggca 
gtgctattcc 
tggcgggcca 
agctgtgaca 
ggcatctggc 
gtggccagtg 
tacttcctcc 



aataagagca 
agccagaact 
ccccgcacgc 
atacccatgt 
aacacagtgg 
gctgccgaat 
cgtgagccac 
tggatgacca 
ggcctgaaca 
ccgaaggaac 
gctagccagg 
gactgcaaga 
gcctgtcagg 
caggtgacca 
atcgtcaagt 
aggaaaaagg 
agacaggcta 
cttcagagca 
acaacaactc 
ctcagatcac 
aggctctcct 
gctggaagcc 
agatcctcat 
ccgtcaacat 
ttagccctat 
agcaatggcc 
aaaaggaagg 
caatcaagaa 
agcgcacgca 
agaagaaatc 
aagacttcag 
ttcgatatca 
gtagcatgac 
agtacatgga 
tcgaggagct 
agaaggagcc 
agcctatcgt 
ggaagttgaa 
tcctccgcgg 
aactggcaga 
ccaaggacct 
accaggagcc 
ctaacgacgt 
tctggggaaa 
ggacagagta 
tggtgaagct 
tggatggggc 
gcagacagaa 
tttacctcgc 
ccctgggcat 
tcgagcagct 
ttggcggcaa 
tggatggcat 
tggctagcga 
agtgtcagct 
aactcgattg 
gctacatcga 
tgaagctggc 



aaaagaaggc 
accccatcgt 
tgaacgcctg 
tctcagccct 
ggggacacca 
gggatcgtgt 
ggggctcaga 
acaacccacc 
agatcgtgcg 
cctttcgcga 
aggtgaagaa 
cgatcctgaa 
gagtgggcgg 
actccgctac 
gcttcaactg 
gctgttggaa 
attttttagg 
gaccagagcc 
cctctcagaa 
tctttggcag 
ggacaccgga 
gaagatgatc 
cgaaatctgc 
catcggacgc 
cgagacggta 
attgacagag 
gaaaatctcc 
gaaggactcg 
agacttctgg 
cgtgaccgta 
gaagtacact 
gtacaacgtg 
caaaatcctg 
tgacttgtac 
gcgccagcac 
tcccttcctc 
gctgccagag 
ctgggccagt 
aaccaaggca 
aaaccgagag 
gatcgccgag 
cttcaagaac 
caagcagctg 
gactcctaag 
ttggcaggcc 
gtggtaccag 
cgctaacagg 
ggttgtcacc 
tttgcaggac 
cattcaagcc 
gatcaagaag 
tgagcaggtc 
cgacaaggcc 
cttcaacctg 
caagggcgaa 
cacccatctg 
ggccgaggtc 
aggccggtgg 



ccaacaggcc 
gcagaacatc 
ggtgaaggtg 
gtcagaggga 
ggccgccatg 
gcatccggtg 
catcgccgga 
catcccggtg 
catgtatagc 
ctacgtggac 
ctggatgacc 
ggccctgggc 
acccggccac 
catcatgatg 
tggcaaagaa 
atgtggaaag 
gaagatctgg 
aacagcccca 
gcaggagccg 
cgacccctcg 
gcagacgaca 
gggggaatcg 
ggccacaagg 
aacctgttga 
ccggtgaagc 
gagaagatca 
aagattgggc 
acgaaatggc 
gaggttcagc 
ctggatgtgg 
gccttcacaa 
ctgccccagg 
gagcctttcc 
gtgggctctg 
ctgttgaggt 
tggatgggtt 
aaagacagct 
cagatttacc 
ctcacagagg 
atcctaaagg 
atccagaagc 
ctgaagaccg 
accgaggccg 
ttcaagctgc 
acctggattc 
ctggagaagg 
gagactaagc 
ctcactgaca 
tcgggcctgg 
cagccagacc 
gaaaaggtct 
gacaagctgg 
caggacgagc 
ccccctgtgg 
gccatgcatg 
gagggcaagg 
attcccgccg 
ccagtgaaga 



gccgcggaca 
caggggcaga 
gtggaagaga 
gccacccccc 
cagatgctga 
cacgcagggc 
acgactagta 
ggagaaatct 
cctaccagca 
cggttctaca 
gaaaccctgc 
ccagcggcta 
aaggcacgcg 
cagcgcggca 
gggcacacag 
gaaggacacc 
ccttcccaca 
ccagaagaga 
atagacaagg 
tcacaataaa 
ccgtgctgga 
gcggtttcat 
ctatcggtac 
cgcagatcgg 
tgaagcccgg 
aggcactggt 
ctgagaaccc 
gcaagctggt 

tgggcatccc 

gtgatgccta 
tcccttcgat 
gctggaaagg 
gcaaacagaa 
atctagagat 
ggggactgac 
acgagctgca 
ggactgtcaa 
cagggattaa 
tgatccccct 
agcccgtgca 
aggggcaagg 
gcaagtacgc 
tgcagaagat 
ccatccagaa 
ctgagtggga 
agcccatagt 
tgggcaaagc 
ccaccaacca 
aggtgaacat 
agagtgagtc 
atctggcctg 
tctcggctgg 
acgagaaata 
tggccaaaga 
gccaggtgga 
ttatcctggt 
aaacagggca 
ccatccatac 



ccggacacag 
tggtgcacca 
aggcttttag 
aagatctgaa 
aggagaccat 
ccatcgcacc 
cccttcagga 
acaaacgctg 
tcctggacat 
aaacgctccg 
tggtccagaa 
ccctagagga 
tcctggctga 
actttcggaa 
cccgcaactg 
aaatgaaaga 
agggaaggcc 
gcttcaggtt 
aactgtatcc 
gatagggggg 
ggagatgtcg 
caaggtgcgc 
cgtgctggtg 
ttgcacgctg 
gatggacggc 
ggagatttgc 
gtacaacacg 
ggacttccgc 
gcaccccgca 
cttctccgtt 
caacaacgag 
ctctcccgca 
ccccgacatc 
agggcagcac 
cacacccgac 
ccctgacaaa 
cgacatacag 
ggtgaggcag 
aaccgaggag 
cggcgtgtac 
ccagtggacc 
ccggatgagg 
caccaccgaa 
ggaaacctgg 
gttcgtcaac 
gggcgccgaa 
cggatacgtc 
gaagactgag 
cgtgacagac 
cgagctggtc 
ggtacccgcc 
catcaggaag 
ccacagcaac 
gatcgtggcc 
ctgtagcccc 
agccgtccat 
ggagacagcc 
tgacaatggc 



420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2700 

2760 

2820 

2880 

2940 

3000 

3060 

3120 

3180 

3240 

3300 

3360 

3420 

3480 

3540 

3600 

3660 

3720 

3780 

3840 
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agcaatttca ccagtgctac ggttaaggcc gcctgctggt gggcgggaat caagcaggag 3900
ttcgggatcc cctacaatcc ccagagtcag ggcgtcgtcg agtctatgaa taaggagtta 3960 
aagaagatta tcggccaggt cagagatcag gctgagcatc tcaagaccgc ggtccaaatg 4020 
gcggtattca tccacaattt caagcggaag ggggggattg gggggtacag tgcgggggag 4080
cggatcgtgg acatcatcgc gaccgacatc cagactaagg agctgcaaaa gcagattacc 4140 
aagattcaga atttccgggt ctactacagg gacagcagaa atcccctctg gaaaggccca 4200 
gcgaagctcc tctggaaggg tgagggggca gtagtgatcc aggataatag cgacatcaag 4260
gtggtgccca gaagaaaggc gaagatcatt agggattatg gcaaacagat ggcgggtgat 4320 
gattgcgtgg cgagcagaca ggatgaggat tag 4353 



<210> 14 
<211> 4327 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: pSYNGP4 -codon 
optimised HIV-1 gagpol with 20bp of the leader
sequence of HIV-1 



<400> 14 

cggaggctag 

accgctggga 

tcgtgtgggc 

gcgaggggtg 

agctgcgcag 

tcaaggatac 

aggcccaaca 

tcgtgcagaa 

cctgggtgaa 

ccctgtcaga 

accaggccgc 

gtgtgcatcc 

cagacatcgc 

cacccatccc 

tgcgcatgta 

gcgactacgt 

agaactggat 

tgaaggccct 

gcggacccgg 

ctaccatcat 

actgtggcaa 

ggaaatgtgg 

tagggaagat 

agccaacagc 

agaagcagga 

gcagcgaccc 

cggagcagac 

gatcggggga 

ctgcggccac 

acgcaacctg 

ggtaccggtg 

agaggagaag 

ctccaagatt 

ctcgacgaaa 

ctgggaggtt 

cgtactggat 



aaggagagag 
gaagatccgc 
cagccgcgaa 
ccgccagatc 
cctgtacaac 
gaaagaggcc 
ggccgccgcg 
catccagggg 

ggtggtggaa 

gggagccacc 
catgcagatg 
ggtgcacgca 
cggaacgact 
ggtgggagaa 
tagccctacc 
ggaccggttc 
gaccgaaacc 
gggcccagcg 
ccacaaggca 
gatgcagcgc 
agaagggcac 
aaaggaagga 
ctggccttcc 
cccaccagaa 
gccgatagac 
ctcgtcacaa 
gacaccgtgc 
atcggcggtt 
aaggctatcg 
ttgacgcaga 
aagctgaagc 
atcaaggcac 
gggcctgaga 
tggcgcaagc 
cagctgggca 
gtgggtgatg 



atgggcgccc 
ctgcgccccg 
ctggagcgct 
ctcggccaac 
accgtggcca 
ctggataaaa 
gacaccggac 
cagatggtgc 
gagaaggctt 
ccccaagatc 
ctgaaggaga 
gggcccatcg 
agtacccttc 
atctacaaac 
agcatcctgg 
tacaaaacgc 
ctgctggtcc 
gctaccctag 
cgcgtcctgg 
ggcaactttc 
acagcccgca 
caccaaatga 
cacaagggaa 
gagagcttca 
aaggaactgt 
taaagatagg 
tggaggagat 
tcatcaaggt 
gtaccgtgct 
tcggttgcac 
ccgggatgga 
tggtggagat 
acccgtacaa 

tggtggactt 

tcccgcaccc 
cctacttctc 



gcgccagcgt 
gcggcaaaaa 
tcgccgtgaa 
tgcagcccag 
cgctgtactg 
tcgaagagga 
acagcaacca 
accaggccat 
ttagcccgga 
tgaacaccat 
ccatcaatga 
caccgggcca 
aggaacagat 
gctggatcat 
acatccgcca 
tccgcgccga 
agaacgcgaa 
aggaaatgat 
ctgaggccat 
ggaaccaacg 
actgcagggc 
aagattgtac 
ggccagggaa 
ggtttgggga 
atcctttagc 
ggggcagctc
gtcgttgcca 
gcgccagtat 
ggtgggcccc 
gctgaacttc 
cggcccgaag 
ttgcacagag 
cacgccggtg 
ccgcgagctg 
cgcagggctg 
cgttcccctg 



gctgtcgggc 
gaagtacaag 
ccccgggctc 
cctgcaaacc 
cgtccaccag 
acagaataag 
ggtcagccag 
ctccccccgc 
ggtgataccc 
gctcaacaca 
ggaggctgcc 
gatgcgtgag 
cggctggatg 
cctgggcctg 
aggcccgaag 
gcaggctagc 
cccggactgc 
gaccgcctgt 
gagccaggtg 
caagatcgtc 
ccctaggaaa 
tgagagacag 
ttttcttcag 
agagacaaca 
ttccctcaga 
aaggaggctc 
ggccgctgga 
gaccagatcc 
acacccgtca 
cccattagcc 
gtcaagcaat 
atggaaaagg 
ttcgcaatca 
aacaagcgca 
aagaagaaga 
gacgaagact 



ggcgagctgg 
ctgaagcaca 
ctggagacca 
ggcagcgagg 
cgcatcgaaa 
agcaaaaaga 
aactacccca 
acgctgaacg 
atgttctcag 
gtggggggac 
gaatgggatc 
ccacggggct 
accaacaacc 
aacaagatcg 
gaaccctttc 
caggaggtga 
aagacgatcc 
cagggagtgg 
accaactccg 
aagtgcttca 
aagggctgtt 
gctaattttt 
agcagaccag 
actccctctc 
tcactctttg 
tcctggacac 
agccgaagat 
tcatcgaaat 
acatcatcgg 
ctatcgagac 
ggccattgac 
aagggaaaat 
agaagaagga 
cgcaagactt 
aatccgtgac 
tcaggaagta 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 
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cactgccttc 
cgtgctgccc 
cctggagcct 
gtacgtgggc 
gcacctgttg 
cctctggatg 
agagaaagac 
cagtcagatt 
ggcactcaca 
agagatccta 
cgagatccag 
gaacctgaag 
gctgaccgag 
taagttcaag 
ggccacctgg 
ccagctggag 
cagggagact 
caccctcact 
ggactcgggc 
agcccagcca 
gaaggaaaag 
ggtcgacaag 
ggcccaggac 
cctgccccct 
cgaagccatg 
tctggagggc 
ggtcattccc 
gtggccagtg 
ggccgcctgc 
tcagggcgtc 
tcaggctgag 
gaaggggggg 
catccagact 
cagggacagc 
ggcagtagtg 
cattagggat 
ggattag 



acaatccctt 
cagggctgga 
ttccgcaaac 
tctgatctag 
aggtggggac 
ggttacgagc 
agctggactg 
tacccaggga 
gaggtgatcc 
aaggagcccg 
aagcaggggc 
accggcaagt 
gccgtgcaga 
ctgcccatcc 
attcctgagt 
aaggagccca 
aagctgggca 
gacaccacca 
ctggaggtga 
gaccagagtg 
gtctatctgg 
ctggtctcgg 
gagcacgaga 
gtggtggcca 
catggccagg 
aaggttatcc 
gccgaaacag 
aagaccatcc 
tggtgggcgg 
gtcgagtcta 
catctcaaga 
attggggggt 
aaggagctgc 
agaaatcccc 
atccaggata 
tatggcaaac 



cgatcaacaa 
aaggctctcc 
agaaccccga 
agatagggca 
tgaccacacc 
tgcaccctga 
tcaacgacat 
ttaaggtgag 
ccctaaccga 
tgcacggcgt 
aaggccagtg 
acgcccggat 
agatcaccac 
agaaggaaac 
gggagttcgt 
tagtgggcgc 
aagccggata 
accagaagac 
acatcgtgac 
agtccgagct 
cctgggtacc 
ctggcatcag 
aataccacag 
aagagatcgt 
tggactgtag 
tggtagccgt 

ggcaggagac
atactgacaa 
gaatcaagca 
tgaataagga 
ccgcggtcca 
acagtgcggg 
aaaagcagat 
tctggaaagg 
atagcgacat 
agatggcggg 



cgagacaccg 
cgcaatcttc 
catcgtcatc 
gcaccgcacc 
cgacaagaag 
caaatggacc 
acagaagctg 
gcagctgtgc 
ggaggccgag 
gtactatgac 
gacctatcag 
gaggggtgcc 
cgaaagcatc 
ctgggaaacc 
caacacccct 
cgaaaccttc 
cgtcactaac 
tgagctgcag 
agactctcag 
ggtcaatcag 
cgcccacaaa 
gaaggtgcta 
caactggcgg 
ggccagctgt 
ccccggcatc 
ccatgtggcc 
agcctacttc 
tggcagcaat 
ggagttcggg 
gttaaagaag 
aatggcggta 
ggagcggatc 
taccaagatt 
cccagcgaag 
caaggtggtg 
tgatgattgc 



gggattcgat 
cagagtagca 
tatcagtaca 
aagatcgagg 
caccagaagg 
gtgcagccta 

gtggggaagt 

aaactcctcc 
ctcgaactgg 
ccctccaagg 
atttaccagg 
cacactaacg 
gtgatctggg 
tggtggacag 
cccctggtga 
tacgtggatg 
cggggcagac 
gccatttacc 
tatgccctgg 
atcatcgagc 
ggcattggcg 
ttcctggatg 
gccatggcta 
gacaagtgtc 
tggcaactcg 
agtggctaca 
ctcctgaagc 
ttcaccagtg 
atcccctaca 
attatcggcc 
ttcatccaca 
gtggacatca 
cagaatttcc 
ctcctctgga 
cccagaagaa 
gtggcgagca 



atcagtacaa 
tgaccaaaat 
tggatgactt 
agctgcgcca 
agcctccctt 
tcgtgctgcc 
tgaactgggc 
gcggaaccaa 
cagaaaaccg 
acctgatcgc 
agcccttcaa 
acgtcaagca 
gaaagactcc 
agtattggca 
agctgtggta 
gggccgctaa 
agaaggttgt 
tcgctttgca 
gcatcattca 
agctgatcaa 
gcaatgagca 
gcatcgacaa 
gcgacttcaa 
agctcaaggg 
attgcaccca 
tcgaggccga 
tggcaggccg 
ctacggttaa 
atccccagag 
aggtcagaga 
atttcaagcg 
tcgcgaccga 
gggtctacta 
agggtgaggg 
aggcgaagat 
gacaggatga 



2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4327 



<210> 15 

<211> 22 

<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Illustrative 
helix II sequence 

<400> 15 

cugaugaggc cgaaaggccg aa 22 



<210> 16 

<211> 22 

<212> RNA 

<213> Human immunodeficiency virus type 1 
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<400> 16 

uaguaagaau guauagcccu ac 



<210> 17 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1 
<400> 17 

aacccagauu guaagacuau uu 



<210> 18 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1 
<400> 18 

uguuucaauu guggcaaaga ag 



<210> 19 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1 
<400> 19 

aaaaagggcu guuggaaaug ug 



<210> 20 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1 
<400> 20 

acgaccccuc gucacaauaa ag 



<210> 21 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1 
<400> 21 

ggaauuggag guuuuaucaa ag 



<210> 22 

<211> 22 

<212> RNA 

<213> Human immunodeficiency virus type 1 



<400> 22 

auauuuuuca guucccuuag au 
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<210> 23 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1
<400> 23 

uggaugauuu guauguagga uc 



<210> 24 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1
<400> 24 

cuuuggaugg guuaugaacu cc 



<210> 25 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1
<400> 25 

cagcuggacu gucaaugaca ua 



<210> 26 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1
<400> 26 

aacuuucuau guagaugggg ca 



<210> 27 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1
<400> 27 

aaggccgccu guuggugggc ag 



<210> 28 
<211> 22 
<212> RNA 

<213> Human immunodeficiency virus type 1
<400> 28 

uaagacagca guacaaaugg ca 



<210> 29 
<211> 30 
<212> DNA 

<213> Artificial Sequence 
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<220> 

<223> Description of Artificial Sequence: Primer 
<400> 29 

cagctgctcg agcagctgaa gcttgcatgc 30



<210> 30 

<211> 34 

<212> DNA 

<213> Artificial Sequence



<220> 

<223> Description of Artificial Sequence: Primer 
<400> 30 

gtaagttatg taacggacga tatcttgtct tctt 34 



<220>



<210> 31 

<211> 37 

<212> DNA 

<213> Artificial Sequence 



<223> Description of Artificial Sequence: Primer 
<400> 31 

cgcatagtcg acgggcccgc cactgctaga gattttc 37



<210> 32 

<211> 116 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 



<400> 32 

tcgaggtcga ctggtggaca gggaaggatt cgaaccttcg aagtcgatga cgtagagaaa 60 
aaatggtggc agtagaagga ttcgaacctt cgaagtcgat gacgtcatcc ccgggc 116 

<210> 33 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 



<400> 33 

tcgaggtcga ctggtggaac tggaaggatt cgaaccttcg aagtcgatga cgttcctaaa 60 
aaatggtgaa tcatgaagga ttcgaacctt cgaagtcgat gacgtaatac 110 
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<210> 34 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 34 

tcgaggtcga ctggtgggcc ccgaaggatt cgaaccttcg aagtcgatga cgtggaaaaa 60 
aaatggtggg aagagaagga ttcgaacctt cgaagtcgat gacgttggcc 110 



□ 

w 



n 3 



<210> 35 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 35 

tcgaggtcga ctggtgacag cagaaggatt cgaaccttcg aagtcgatga cgttcagaaa 60 
aaatggtgaa gcaagaagga ttcgaacctt cgaagtcgat gacgtagccc 110 



<210> 36 
<211> 110 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 36 

tcgaggtcga ctggtgtaag aagaaggatt cgaaccttcg aagtcgatga cgttataaaa 60 
aaatggtgac cggtgaagga ttcgaacctt cgaagtcgat gacgttatac 110 



<210> 37 
<211> 116 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
oligonucleotide 

<400> 37 

tcgaggcatg cgtcgactgg tgggcctaga aggattcgaa ccttcgaagt cgatgacgtg 60 
cacaaaaaat ggtgaactac gaaggattcg aaccttcgaa gtcgatgacg tgtacc 116 
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<210> 38 
<211> 12 
<212> DNA 

<213> Human immunodeficiency virus type 1 

<400> 38 
atgggtgcga ga 

<210> 39 
<211> 12 
<212> DNA 

<213> Human immunodeficiency virus type 1 

<400> 39 
gatgaggatt ag 

<210> 40 
<211> 12 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: 

gagpol-SYNgp-codon optimised gagpol sequence 

<400> 40 
atgggcgccc gc 

<210> 41 
<211> 12 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: 

gagpol-SYNgp-codon optimised gagpol sequence 

<400> 41 
gatgaggatt ag 

<210> 42 
<211> 12 
<212> DNA 

<213> Human immunodeficiency virus type 1 

<400> 42 
atgagagtga ag 

<210> 43 
<211> 12 
<212> DNA 

<213> Human immunodeficiency virus type 1 



hi 



RJ 



ru 
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<400> 43 

gctttgctat aa 12 



<210> 44 
<211> 12 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: 

SYNgp-160nm-codon optimised env sequence 

<400> 44 

atgagggtga ag 12 



<210> 45 

<211> 12 

<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: 

SYNgp-160nm-codon optimised env sequence



<400> 45



gcgctgctgt aa 12 



<210> 46 
<211> 34 
<212> RNA 

<213> Human immunodeficiency virus type 1 
<400> 46 

ggcucgaacu ugucgugguu aucguggaug uguc 34 



<210> 47 
<211> 63 
<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: EGS based on 
Tyrosyl t-RNA

<400> 47 

cgauagcaga cucuaaaucu gccgucaucg acuucgaagg uucgaauccu ucccaggaca 60 
cca 63 



<210> 48 

<211> 66 

<212> RNA 

<213> Artificial Sequence 
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<220> 

<223> Description of Artificial Sequence: Consensus EGS 
sequence 

<220> 

<221> modified_base

<222> (1)..(7)

<223> Any nucleotide 

<220> 

<221> modified_base
<222> (56)..(61)
<223> Any nucleotide

<400> 48 

nnnnnnnagc agacucuaaa ucugccguca ucgacuucga agguucgaau ccuucnnnnn 60 
ncacca 66 



5 * 



m 



<210> 49 

<211> 49 

<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Consensus EGS
sequence



ry 



<220> 

<221> modified_base

<222> (1)..(7)

<223> Any nucleotide 

<220> 

<221> modified_base
<222> (39)..(44)
<223> Any nucleotide 



<400> 49 

nnnnnnnacg ucaucgacuu cgaagguucg aauccuucnn nnnncacca 49



<210> 50 

<211> 13 

<212> RNA 

<213> Human immunodeficiency virus type 1 



<400> 50 
gggccuauag cac 13



<210> 51 

<211> 13 

<212> RNA 

<213> Human immunodeficiency virus type 1 



<400> 51 
gaacuacuag uac 13
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<210> 52 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 52 
guaagaaugu aua 

<210> 53 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 53 
gaccgguucu aua 

<210> 54 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 54 
gacagcaugu cag 

<210> 55 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 55 
gaagcaauga gcc 

<210> 56 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 56 
gggccccuag gaa 

<210> 57 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 57 
gggaagaucu ggc 

<210> 58 
<211> 13 
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<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 58 
ggaacuguau ccu



<210> 59 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 59 
gaaucuauga aua 



<210> 60 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 60 
ggacagguaa gag 



<210> 61 
<211> 13 
<212> RNA 

<213> Human immunodeficiency virus type 1 

<400> 61 
ggcaguauuc auc 



<210> 62 
<211> 46 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Combined DNA/RNA Molecule: Anti-HIV
EGS construct 

<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 62 

gtgcacguca ucgacuucga agguucgaau ccuucuaggc ccacca



<210> 63 

<211> 46 

<212> DNA 

<213> Artificial Sequence
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<220> 

<223> Description of Combined DNA/RNA Molecule: Anti-HIV 
EGS construct 

<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 63 

gtacacguca ucgacuucga agguucgaau ccuucguagu ucacca 



<210> 64 

<211> 46 

<212> RNA 

<213> Artificial Sequence



<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 64 

uauaacguca ucgacuucga agguucgaau ccuucuucuu acacca 



<210> 65 
<211> 46 
<212> RNA 

<213> Artificial Sequence 



<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 65 

uauaacguca ucgacuucga agguucgaau ccuucaccgg ucacca 



<210> 66 

<211> 46 

<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 66 

cugaacguca ucgacuucga agguucgaau ccuucugcug ucacca 



<210> 67 

<211> 46 

<212> RNA 

<213> Artificial Sequence



25 



<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 67 

ggcuacguca ucgacuucga agguucgaau ccuucuugcu ucacca 



<210> 68 
<211> 46 
<212> DNA 

<213> Artificial Sequence 
<220> 

<223> Description of Combined DNA/RNA Molecule: Anti-HIV 
EGS construct 

<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 68 

ttccacguca ucgacuucga agguucgaau ccuucggggc ccacca 



<210> 69 
<211> 46 
<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 69 

gccaacguca ucgacuucga agguucgaau ccuucucuuc ccacca 



<210> 70 
<211> 46 
<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 70 

aggaacguca ucgacuucga agguucgaau ccuuccaguu ccacca 



<210> 71 

<211> 46 

<212> RNA 

<213> Artificial Sequence 




t 



26 



<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 



<400> 71 



uauuacguca ucgacuucga agguucgaau ccuucuagau ucacca 46



<210> 72 

<211> 46 

<212> RNA 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Anti-HIV EGS 
construct 

<400> 72 

cucuacguca ucgacuucga agguucgaau ccuucccugu ccacca 46



UJ 



<210> 73
<211> 46
<212> RNA
<213> Artificial Sequence



HI 



<220>
<223> Description of Artificial Sequence: Anti-HIV EGS
construct



fli 



<400> 73



gaugacguca ucgacuucga agguucgaau ccuucuacug ccacca 46



